import urllib.request
from lxml import etree

# Page to download.
url = 'https://www.baidu.com'

# Request headers: send a desktop-Chrome User-Agent string with the request.
headers = {
    'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/134.0.0.0 Safari/537.36'
}

request = urllib.request.Request(url, headers=headers)

# Use the response as a context manager so the connection is closed even if
# reading or decoding fails, and set a timeout so a stalled server cannot
# hang the script indefinitely.
with urllib.request.urlopen(request, timeout=10) as response:
    content = response.read().decode('utf-8')

# Parse the page source returned by the server so it can be queried with XPath.
tree = etree.HTML(content)

# Select the `value` attribute of the <input id="su"> element.
matches = tree.xpath("//input[@id='su']/@value")
if not matches:
    # Same exception type a bare `[0]` would raise on an empty result, but
    # with a message that says what was actually missing.
    raise IndexError(
        "no <input id='su'> element with a value attribute found at " + url
    )
result = matches[0]
print(result)

